#coding=utf-8
# ---------------------------------------------------------------------------
# Environment
# ---------------------------------------------------------------------------
# Name of the game (environment identifier).
gamename = "MountainCar-v0"
# Dimensionality of the state space.
stateSize = 2
# Dimensionality of the action space.
actionSize = 3

# ---------------------------------------------------------------------------
# Data collection / replay storage
# ---------------------------------------------------------------------------
# Number of episodes to collect.
max_episode = 200
# Number of steps to collect.
maxSteps = 80000
# Maximum number of tuples kept in the in-memory storage.
storageMaxSize = 1000000
# Training starts once the number of collected tuples reaches this threshold.
# NOTE: the product is a float (1% of storageMaxSize).
startTrainSize = 0.01 * storageMaxSize

# ---------------------------------------------------------------------------
# Training
# ---------------------------------------------------------------------------
# Number of iterations performed during training.
train_iter_number = 15000
# Batch size.
batchSize = 32
# Discount rate.
discount = 0.7
# Determines how often the network is updated.
updateStep = 15000

# NOTE(review): presumably the start/end values of an exploration epsilon
# schedule -- confirm against the code that reads them.
epStart = 1.0
epEnd = 0.3

# ---------------------------------------------------------------------------
# Checkpointing and logging
# ---------------------------------------------------------------------------
saveVersion = 1.1
# Run label "<gamename>-<saveVersion>"; also embedded in the checkpoint path.
logName = "-".join([gamename, str(saveVersion)])
saveModelPath = "checkpoints/" + logName + "/model/"
saveModelStep = 50000
# No model is set here; NOTE(review): presumably assigned elsewhere -- confirm.
model = None

# ---------------------------------------------------------------------------
# Learning-rate settings
# ---------------------------------------------------------------------------
learning_rate = 0.001
learning_rate_minimum = 0.0001
learning_rate_decay = 0.96
learning_rate_decay_step = 20000

# ---------------------------------------------------------------------------
# Run-mode switches
# ---------------------------------------------------------------------------
train_flag = True

train_render_flag = False
